home *** CD-ROM | disk | FTP | other *** search
/ MacAddict 108 / MacAddict108.iso / Software / Internet & Communication / JunkMatcher 1.5.5.dmg / JunkMatcher.app / Contents / Resources / Defaults / patterns < prev    next >
Encoding:
Text File  |  2005-06-01  |  15.4 KB  |  703 lines

  1. "(?i)(?#f-)(?#o-)(?#r-)(?#w-)(?#a-)(?#r-)(?#d-)\W(?#l-)(?#o-){2}(?#k-)(?#i-)(?#n-)(?#g-)\s+(?#s-)(?#t-)(?#a-)(?#t-)(?#e-)(?#m-)(?#e-)(?#n-)(?#t-)"
  2. "Stock news disclaimer I"
  3. M
  4. ""
  5. ""
  6. body 10135.322756 1 556 0 485
  7.  
  8. "(?i)[a-z]+(?:[~^`]+[a-z]+){2,}"
  9. "Punctuated words"
  10. M
  11. ""
  12. ""
  13. body 2008.533953 0 555 0 450
  14. rendering 2143.412495 0 14 0 75
  15. subject 544.773335 0 585 0 11376
  16.  
  17. "(?i)(?:(?#m-)(?#a-)(?#n-)(?#h-)(?#o-)(?#o-)d|(?#a-)(?#l-)(?#p-)(?#h-)(?#a-)\s+(?#m-)(?#a-)(?#l-)(?#e-)|(?#p-)(?#o-)(?#t-)(?#e-)(?#n-)(?#c-)(?#y-))"
  18. "Manhood/alpha male/potency"
  19. M
  20. ""
  21. ""
  22. body 733.428309 6 556 0 500
  23. rendering 467.621147 0 14 0 70
  24. subject 2384.396306 2 585 0 11393
  25.  
  26. "(?i)(?:(?#f-)(?#r-)(?#e-)(?#e-)(?:\s+\S+)?\s+(?:(?#s-)(?#h-)(?#i-)(?#p-)(?#p-)|(?#d-)(?#e-)(?#l-)(?#i-)(?#v-)|(?#m-)(?#e-)(?#m-)(?#b-)(?#e-)(?#r-)(?#s-)(?#h-))|get (?:\S+ ){,8}(?:and|&) save|limite(?#d-)time|(?:limited (?:time )?|promotion.+)(?#o-)ffer|(?:(?#b-)(?#u-)(?#y-)|call|get (?:yours|it|them)) (?:n(?#o-)w|t(?#o-)day)|(?:1(?:\W|_)??0(?:\W|_)??0(?:\W|_)??%|satisfaction)\s+guaranteed?|all[\s-]natural|pre-?\s?qualified|(?:z(?#e-)(?#r-)(?#o-)|[0o])\s+payment|mone(?#y-)back)"
  27. "Free shipp(ing)/deliv(ery)/membersh(ip), get x and save/limited time/promotional offer, buy/call/get yours now/today, x%/satisfaction guaranteed, pre-qualified, zero payment, money-back"
  28. M
  29. ""
  30. ""
  31. body 3545.890484 22 559 0 615
  32. rendering 1818.878310 0 14 0 70
  33. subject 4535.301838 37 588 0 11605
  34.  
  35. "(?i)(?#<_)font[^>]+(?:color="?(?:#?(?:FFFF|F.F.F.)|white))"
  36. "White font"
  37. M
  38. ""
  39. ""
  40. body 3268.050497 2 15 0 130
  41.  
  42. "(?i)(?:http://[^> ]*|[\w_]+(?:\.[\w_]+){2,4})\.(?:biz|cx|to)\b"
  43. ".biz/.cx/.to sites"
  44. M
  45. ""
  46. ""
  47. body 3848.389268 14 562 0 610
  48.  
  49. "(?is)\b(?:(?#d-)(?#a-)(?#t-)|(?#c-)(?#h-)(?#e-)(?#a-)(?#t-)|(?#l-)(?#o-)(?#n-)(?#e-)).+(?:(?#h-)(?#o-)(?#u-)(?#s-)(?#e-)?)?(?#w-)(?#i-)(?:(?#v-)|(?#f-))(?#e-)"
  50. "Dating/cheating/lonely and wives"
  51. M
  52. ""
  53. ""
  54. body 1124.095183 2 557 0 480
  55. subject 2338.134784 2 588 0 11403
  56.  
  57. "(?i)(?#e-)(?#n-)(?#l-)(?#a-)(?#r-)(?#g-)(?#e-)(?#m-)(?#e-)(?#n-)t"
  58. "Enlargement"
  59. M
  60. ""
  61. ""
  62. body 276.019188 0 555 0 460
  63. rendering 148.221346 0 14 0 75
  64. subject 1042.661373 1 585 0 11384
  65.  
  66. "(?i)\b(?:breast|tits|nipples?|pussy)"
  67. "Breast/tits/nipples/pussy"
  68. M
  69. ""
  70. ""
  71. body 591.073388 2 555 0 461
  72. subject 188.033930 1 585 0 11397
  73.  
  74. "(?i)\b(?#p-)(?#o-)(?#r-)(?#n-)"
  75. "Porn"
  76. M
  77. ""
  78. ""
  79. body 121.857959 2 556 0 503
  80. rendering 85.345723 0 14 0 74
  81. subject 391.059086 4 587 0 11412
  82.  
  83. "(?i)\.(?:exe|com)$"
  84. "Windoze executables"
  85. M
  86. ""
  87. ""
  88. filenames 73.150790 1 590 0 12924
  89.  
  90. "(?i)<a\s+[^>]+>\s*(?:<font[^>]*>\s*)?(?:no\W*more\W*(?:sending|\?)|remove|(?#t-)(?#a-)(?#k-)(?#e-)?\W*(?:(?#m-)(?#e-)\W*)?(?#o-)(?#f-)(?#f-)|(?#o-)(?#f-)(?#f-)|don\'?t\W*want|stop)"
  91. "Other phrases to unsubscribe"
  92. M
  93. ""
  94. ""
  95. body 26193.541573 0 14 0 91
  96.  
  97. "(?is)(?:st(?#o-)ck.+(?:(?#s-)(?#t-)(?#a-)(?#t-)(?#e-)(?#m-)(?#e-)(?#n-)(?#t-)|pick))"
  98. "Stock junk"
  99. M
  100. ""
  101. ""
  102. body 5506.876382 153 566 0 712
  103.  
  104. "(?i)(?:(?#d-)(?#r-)(?#u-)(?#g-)|(?#p-)(?#r-)(?#o-)(?#v-)(?#e-)(?#n-)\s+(?#f-)(?#o-)(?#r-)(?#m-)(?#u-))"
  105. "Drug related"
  106. M
  107. ""
  108. ""
  109. body 212.566273 0 66 0 45
  110. subject 2095.272238 1 69 0 1075
  111.  
  112. "(?i)(?:(?#c-)(?#a-)(?#b-)(?#l-)(?#e-)(?:(?#t-)(?#v-)|f(?#i-)(?#l-)t(?#e-)r)|(?#p-)(?#e-)(?#r-)(?#v-)(?#i-)(?#e-)(?#w-)|dvd\s+(?:movie|play))"
  113. "Cable TV/filter, (pay)-per-view, dvd movie/player"
  114. M
  115. ""
  116. ""
  117. body 764.684426 0 554 1 442
  118. subject 1913.210066 37 588 0 11577
  119.  
  120. "(?i)forged"
  121. "Forged headers"
  122. M
  123. ""
  124. ""
  125. headers 16226.149697 18 3 0 110
  126.  
  127. "(?i)(?#c-)(?#a-)(?#s-)(?#i-)(?#n-)"
  128. "Casino"
  129. M
  130. ""
  131. ""
  132. body 342.174010 2 66 0 53
  133. subject 1094.430019 0 69 0 1046
  134.  
  135. "(?i)(?:(?#j-)(?#o-)(?#i-)(?#n-)|(?#b-)(?#u-)(?#y-))\s+(?:now|today)"
  136. "Join/buy now/today"
  137. M
  138. ""
  139. ""
  140. body 4766.113026 1 556 0 464
  141.  
  142. " {5,}"
  143. "5+ consecutive spaces"
  144. M
  145. ""
  146. ""
  147. subject 51.185339 9 587 0 11543
  148.  
  149. "(?i)(?:(?#f-)(?#u-)(?#c-)k|(?#f-)(?#u-)(?#k-)(?#c))"
  150. "Swearing"
  151. M
  152. ""
  153. ""
  154. body 421.117862 0 555 0 454
  155. rendering 592.831815 0 14 0 75
  156. subject 882.658454 5 587 0 11419
  157.  
  158. "(?is)(?#<_)html\s*>.*(?#<_)body\s*>"
  159. "HTML tags in rendering"
  160. M
  161. ""
  162. ""
  163. rendering 882.249666 4 511 1 325
  164.  
  165. "(?i)\b(?:(?#p-)(?:(?:(?#i-)|(?#I-))(?#l-)(?#l-)(?#s-)?\b|(?#r-)(?#e-)(?#s-)(?#c-)(?#r-)(?:(?#i-)|(?#I-))(?#p-)(?#t-)(?:(?#i-)|(?#I-))(?#o-)(?#n)|(?#h-)(?#a-)(?#r-)(?#m-)(?#a-))|(?#m-)(?#e-)(?#d-)(?#i-)?(?:(?#s-)|(?#z-)))"
  166. "Pill(s)/prescription/pharma(cy)/meds"
  167. M
  168. ""
  169. ""
  170. body 670.142561 123 565 3 866
  171. rendering 378.474761 0 14 0 75
  172. subject 2924.749156 508 588 0 12365
  173.  
  174. "(?is)(?:(?:(?#f-)(?#r-)(?#e-)(?#e-)|special)\s+(?:(?#o-)(?#f-)(?#f-)(?#e-)(?#r)|(?#q-)(?#u-)(?#o-)(?#t-)(?#e))|sav(?:e|ings?\W+(?:of)?)\W+(?:up\W+to|over)\W+\S+%|get\W+\S+%\W*off|(?#b-)(?#u-)(?#y-).{,10}\S+%\W*(?#l-)(?:(?#e-)(?#s-)(?#s-)|(?#o-)(?#w-)))"
  175. "Free/special offer/quote / (save/savings (of)) (up to/over) x%; get x% off; buy xx x% less/low"
  176. M
  177. ""
  178. ""
  179. body 13905.066914 11 561 1 584
  180. rendering 1948.830626 0 14 0 70
  181.  
  182. "(?i)(?#<_)img\s+[^>]*(?:low)?src\s*=\s*['"]?\s*http:"
  183. "External images"
  184. M
  185. ""
  186. ""
  187. body 3421.153526 405 15 9 532
  188.  
  189. "(?i)(?#myNames)"
  190. "My names (requires email addr. in Account preference of Mail.app)"
  191. M
  192. ""
  193. ""
  194. subject 295.174388 149 587 1 11823
  195.  
  196. "(?i)\b(?:(?#p-)(?#e-)(?#n-)(?:(?#i-)|(?#I-))(?#s)|(?#c-)(?#o-)(?#c-)k\b)"
  197. "Penis/cock"
  198. M
  199. ""
  200. ""
  201. body 262.266159 5 555 0 482
  202. rendering 147.562350 0 14 0 75
  203. subject 1041.357253 18 586 0 11394
  204.  
  205. "(?i)(?#<_)a\s+[^>]*href\s*=\s*"\s*mailto:"
  206. "Mailto"
  207. M
  208. ""
  209. ""
  210. body 2272.686826 0 14 1 94
  211.  
  212. "(?i)(?:(?#u-)(?#n-)(?#i-)(?#v-)(?:(?#e-)(?#r-)(?#s-)(?#i-)(?#t-)(?#y-))?|college)(?:\s*\W?\s*)(?:(?#d-)(?#i-)(?#p-)(?#l-)(?#o-)(?#m-)(?#a-)|(?#d-)(?#e-)(?#g-)(?#r-)(?#e-)(?#e-))"
  213. "University/college diploma/degree"
  214. M
  215. ""
  216. ""
  217. body 532.430557 3 557 0 539
  218. rendering 258.986872 0 14 0 75
  219. subject 2437.606510 15 585 0 11468
  220.  
  221. "(?i)(?#<_)body\s+[^>]*onload\s*="
  222. "Body tag with onload attribute"
  223. M
  224. ""
  225. ""
  226. body 3584.447452 0 13 0 48
  227.  
  228. "(?i)http://?(?:(?:%[a-f0-9]{2}){2,})"
  229. "Garbled URLs"
  230. M
  231. ""
  232. ""
  233. body 1001.252703 2 555 0 482
  234.  
  235. "(?i)(?#s-)(?#e-)(?#x-).+(?#e-)(?#x-)(?#p-)(?#l-)"
  236. "Sexually explicit"
  237. M
  238. ""
  239. ""
  240. body 453.091011 2 550 0 412
  241. subject 615.535706 29 584 0 10846
  242.  
  243. "(?i)(?:(?#o-)(?#r-)(?#g-)(?#a-)(?#s-)(?#m-)|(?#e-)(?#r-)(?#e-)(?#c-)(?#t-)(?#i-)(?:(?#o-)(?#n)|(?#l-)(?#e)))"
  244. "Orgasm/erection/erectile"
  245. M
  246. ""
  247. ""
  248. body 632.094648 3 556 0 471
  249. rendering 435.290710 0 14 0 75
  250. subject 1359.969137 33 588 0 11459
  251.  
  252. "(?i)[a-z0-9]{22,}"
  253. "Extremely long words"
  254. M
  255. ""
  256. ""
  257. rendering 1318.454746 6 13 1 71
  258. subject 223.512248 11 588 0 11439
  259.  
  260. "http://[^\020-\0177]+"
  261. "IDN"
  262. M
  263. ""
  264. ""
  265. rendering 458.182531 0 514 0 329
  266.  
  267. "(?i)(?#w-)(?#e-)(?#b-)(?#c-)(?#a-)(?#m-)"
  268. "Webcam"
  269. M
  270. ""
  271. ""
  272. body 171.316381 7 435 0 247
  273. subject 926.780882 2 448 0 5423
  274.  
  275. "(?i)(?#<_)(?:script|object|map)"
  276. "Dangerous tags II"
  277. M
  278. ""
  279. ""
  280. body 1879.464220 1 15 0 142
  281.  
  282. "(?is)(?:(?#h-)(?#o-)(?#u-)(?#s-)(?#e-)(?#w-)(?#i-)(?:(?#v-)(?#e-)?|(?#f-)(?#e-)).+(?#h-)(?#u-)(?#s-)(?#b-)(?#a-)|(?#h-)(?#u-)(?#s-)(?#b-)(?#a-).+(?#h-)(?#o-)(?#u-)(?#s-)(?#e-)(?#w-)(?#i-)(?:(?#v-)(?#e-)(?#s-)|(?#f-)(?#e-)))"
  283. "Housewives and husband"
  284. M
  285. ""
  286. ""
  287. body 432.834316 0 555 0 432
  288. subject 3802.079364 0 586 0 11374
  289.  
  290. "(?i)http://(?:\d+\.\d+\.\d+\.\d+|[^@>\s/]*?@|(?:www\.)?google\.com/url\?|[^>]+[*?]http|\d{8,})"
  291. "Bad URLs/email tracking"
  292. M
  293. ""
  294. ""
  295. body 2096.315968 7 556 1 575
  296.  
  297. "(?i)^[\sa-z]*(?:\[(?:IMG|USEMAP)\][\sa-z]*)+$"
  298. "Nothing but images and/or random words"
  299. M
  300. ""
  301. ""
  302. rendering 1963.272524 0 14 0 75
  303.  
  304. "(?is)(?:(?:[a-z]\s){4,}.+){4,}"
  305. "Space-separated words"
  306. M
  307. ""
  308. ""
  309. body 487.481774 0 555 0 450
  310. rendering 358.747632 0 14 0 75
  311. subject 190.883684 0 585 0 11376
  312.  
  313. "(?i)(?#c-)(?#r-)(?#e-)(?#d-)(?#i-)(?#t-)\s+(?#h-)(?#i-)(?#s-)(?#t-)(?#o-)(?#r-)(?#y-)"
  314. "Credit history"
  315. M
  316. ""
  317. ""
  318. body 6365.812173 2 556 0 472
  319.  
  320. "(?i)(?#s-)(?#t-)(?#o-)(?#c-)(?#k-)"
  321. "Stocks"
  322. M
  323. ""
  324. ""
  325. subject 803.834814 6 64 0 891
  326.  
  327. "(?i)\b(?:(?#c-)(?#l-)(?#i-)(?#c-)(?#k-)|(?#s-)(?#e-)(?#l-)(?#e-)(?#c-)t|(?#p-)(?#r-)(?#e-)(?#s-)(?#s-)|(?#e-)(?#n-)(?#t-)(?#e-)(?#r)|try us|(?#o-)(?#r-)(?#d-)(?#e-)(?#r-))\b\s+(?:\W\s*)?(?:<a[^>]+>)?\s*?(?:(?#h-)(?#e-)(?#r-)(?#e)|(?#b-)(?#e-)(?#l-)(?#o-)w|(?#n-)(?#o-)w)"
  328. "Click/select/press/enter/try us/order here/below/now"
  329. M
  330. ""
  331. ""
  332. body 18910.591213 66 564 1 703
  333. rendering 263.950796 0 14 0 75
  334.  
  335. "(?is)(?:(?#l-)(?#o-)(?#a-)(?#n-).+(?:(?#d-)(?#e-)(?#b-)(?#t-)|(?#r-)(?#a-)(?#t-)(?#e-))|(?:(?#d-)(?#e-)(?#b-)(?#t-)|(?#r-)(?#a-)(?#t-)(?#e-)).+(?#l-)(?#o-)(?#a-)(?#n-))"
  336. "Loan and debt/rate"
  337. M
  338. ""
  339. ""
  340. body 647.373459 4 556 0 486
  341. subject 1871.004366 2 585 0 11374
  342.  
  343. "(?i)estimate(d).+\b(?:day|month).+target"
  344. "Stock: estimated target"
  345. M
  346. ""
  347. ""
  348. body 817.909693 0 548 0 365
  349.  
  350. "(?i)(?#<_)(?:form[^>]+(?:method|action)|textarea)"
  351. "Form method/textarea"
  352. M
  353. ""
  354. ""
  355. body 2441.176660 0 14 0 94
  356.  
  357. "(?i)(?#<_)img\s+[^>]*(?:low)?src\s*=\s*['"]?\s*cid:"
  358. "Internal images"
  359. M
  360. ""
  361. ""
  362. body 2263.339425 130 14 1 349
  363.  
  364. "(?i)\bIPSI\b"
  365. "Annoying senders"
  366. M
  367. ""
  368. ""
  369. sender 35.207511 0 507 0 9296
  370.  
  371. "(?:DATE_IN_FUTURE|HTML_(?:FONT_INVISIBLE|LINK_CLICK_HERE)|CLICK_BELOW)"
  372. "SpamAssassin rules"
  373. M
  374. ""
  375. ""
  376. headers 261.633792 147 590 0 12926
  377.  
  378. "(?i)microsoft"
  379. "Where don't you want to go today?"
  380. M
  381. ""
  382. ""
  383. subject 55.195302 11 585 1 11531
  384.  
  385. "(?i)(?#t-)(?#h-)(?#i-)(?#s-)\s+(?#i-)(?#s-)\s+(?:(?#a-)(?#n-)?)?(?:\s+\S+)?\s+(?#a-)(?#d-)(?:(?#v-)(?#e-)(?#r-)(?#t-)(?#i-)(?#s-)(?#e-)?(?#m-)(?#e-)(?#n-)(?#t-))?"
  386. "This is an ad"
  387. M
  388. ""
  389. ""
  390. body 10552.825975 0 555 0 450
  391. rendering 169.220423 0 14 0 70
  392.  
  393. "(?is)(\bdebt.*){3,}"
  394. ""Debt" 3 or more times"
  395. M
  396. ""
  397. ""
  398. body 1752.406652 3 551 0 436
  399.  
  400. "(?is)</html>\s*\S+"
  401. "Stuff beyond </html>"
  402. M
  403. ""
  404. ""
  405. body 1798.656041 27 15 0 212
  406.  
  407. "(?i)(?:sszb\.org|bbhost\.info|idv\.tw|com-click\.com\.ph|(?:global-submit|getpbp|mardox|freebiegazette|forecastmail|(?#v-)(?#i-)(?#c-)(?#t-)(?#o-)(?#r-)(?#y-)(?#e-)(?#x-)(?#c-)(?#h-)(?#a-)(?#n-)(?#g-)(?#e-)|aitalk|new-fields)\. ?(?#c-)(?#o-)(?#m-)|80-20initiative\.net)"
  408. "Other bad sites"
  409. M
  410. ""
  411. ""
  412. body 12664.320146 2 555 1 484
  413.  
  414. "(?i)(?:(?:(?:un|de)-?|out-of-|(?#o-)(?#f-)(?#f-))list|un-subscrib)"
  415. "Unlist/delist/out-of-/off list/un-subscribe"
  416. M
  417. ""
  418. ""
  419. body 3348.575448 2 556 0 502
  420. rendering 2399.388325 0 14 0 75
  421.  
  422. "(?i)(?#l-)(?#i-)(?#f-)(?#e-)\s+(?#i-)(?#n-)(?#s-)(?#u-)(?#r-)(?#a-)(?#n-)(?#c-)(?#e-)"
  423. "Life insurance"
  424. M
  425. ""
  426. ""
  427. body 282.081208 0 555 0 450
  428. subject 1442.126893 29 588 0 11540
  429.  
  430. "(?is)(?#b-)(?#o-)(?#x-)\W{,2}\d\W{,2}\d\W{,2}\d\W{,2}\d\W{,2}\d\W{,2}"
  431. "PO Box address"
  432. M
  433. ""
  434. ""
  435. body 2521.098785 0 555 0 450
  436. rendering 138.020249 0 14 0 75
  437.  
  438. "(?i)(?:<(?:br|/?p)>\s*){5,}"
  439. "5+ consecutive blank lines"
  440. M
  441. ""
  442. ""
  443. body 1266.108618 1 0 0 8
  444.  
  445. "(?i)(?<!~)(?#myNames)(?!@)"
  446. "My names (requires email addr. in Account preference of Mail.app)"
  447. M
  448. ""
  449. ""
  450. rendering 3152.418136 2 14 0 74
  451.  
  452. "(?i)(?:(?:newsletter\.freebiegazette|xadl|aitalk|new-fields)\.com|sszb|80-20\.info)"
  453. "Bad senders"
  454. M
  455. ""
  456. ""
  457. sender 0.000000 0 0 0 0
  458.  
  459. "(?is)(?#c-)(?#h-)(?#e-)(?#a-)(?#t-).+(?#h-)(?#u-)(?#s-)(?#b-)(?#a-)|(?#h-)(?#u-)(?#s-)(?#b-)(?#a-).+(?#c-)(?#h-)(?#e-)(?#a-)(?#t-)"
  460. "Cheat husband"
  461. M
  462. ""
  463. ""
  464. body 558.611340 0 554 0 431
  465. subject 2601.054931 0 585 0 11374
  466.  
  467. "(?i)\.scr$"
  468. "Windoze screensavers"
  469. M
  470. ""
  471. ""
  472. filenames 66.114324 0 3 0 109
  473.  
  474. "(?i)(?:font-size:|(?#<_)font\s+[^> ]*size=)[^"'0-9]*?(?:(?<![1-9])[0-5](?![0-9])(?:px)?|(?<![1-9])[1-5]?\d%)"
  475. "Tiny font"
  476. M
  477. ""
  478. ""
  479. body 6605.154941 0 14 0 94
  480.  
  481. "(?i)call\s+1-?8(?:[\do-]+|88)"
  482. "Call 1-800/888"
  483. M
  484. ""
  485. ""
  486. body 549.606894 0 60 0 27
  487.  
  488. "(?i)(?#e-)(?#j-)(?#a-)(?#c-)(?#u-)(?#l-)"
  489. "Ejaculation"
  490. M
  491. ""
  492. ""
  493. body 336.045904 2 549 0 387
  494. subject 666.929996 1 578 0 10165
  495.  
  496. "(?:E\s*|\n\s*){5,}\S"
  497. "5+ consecutive blank lines"
  498. M
  499. ""
  500. ""
  501. rendering 1156.073147 1 14 0 75
  502.  
  503. "(?i)http://[^> ]+(?:(?#myEmails)|(?#myNames))"
  504. "Tracking my email/name"
  505. M
  506. ""
  507. ""
  508. body 3751.546860 8 552 10 594
  509.  
  510. "(?i)copy.+paste.+(?:url|link)"
  511. "Copy and paste the URL/link"
  512. M
  513. ""
  514. ""
  515. body 605.409270 0 554 0 433
  516.  
  517. "(?i)([a-z0-9]* ){15,}"
  518. "Subject longer than 15 words"
  519. M
  520. ""
  521. ""
  522. subject 252.860634 8 585 0 11523
  523.  
  524. "(?i)(?:(?:(?:(?#l-)(?#o-)(?#o-)?(?#s-)|reduc)(?:(?#e-)|ing)|l(?#o)ss in)\s+(?:(?:body|the)\W+)?(?:(?#w-)(?#e-)(?#i-)(?#g-)(?#h-)(?#t-)|f(?:(?#A-)|(?#a-))t)|(?#w-)(?#e-)(?#i-)(?#g-)(?#h-)(?#t-)\s*(?#l-)(?#o-)(?#s-)(?#s-))"
  525. "Losing/reducing/loss in (body) weight/fat"
  526. M
  527. ""
  528. ""
  529. body 1353.559532 2 556 0 483
  530. rendering 549.398719 0 14 0 70
  531. subject 2898.557443 55 588 0 11564
  532.  
  533. "(?i)(?#1-)(?#0-)(?#0-)%\s+(?#f-)(?#r-)(?#e-)(?#e-)"
  534. "100% Free"
  535. M
  536. ""
  537. ""
  538. body 264.190226 0 59 0 26
  539. subject 929.243475 0 59 0 802
  540.  
  541. "(?i)(?#<_)meta\s+http-equiv\s*="?refresh"
  542. "Site redirect"
  543. M
  544. ""
  545. ""
  546. body 2103.377269 0 14 0 94
  547.  
  548. "(?i)(?:\b(?:(?#v-)(?:(?#i-)|(?#I-))(?:(?#a-)|(?#A-))(?#g-)(?#r-)(?:(?#a-)|(?#A-))|(?#v-)(?:(?#a-)|(?#A-))(?#l-)(?:(?#i-)|(?#I-))(?#u-)m|(?#v-)(?:(?#i-)|(?#I-))(?#c-)(?#o-)(?#d-)(?:(?#i-)|(?#I-))(?#n)|(?#x-)(?:(?#a-)|(?#A-))(?#n-)(?:(?#a-)|(?#A-))x|(?#c-)(?:(?#i-)|(?#I-))(?:(?#a-)|(?#A-))(?#l)(?:(?#i-)|(?#I-))(?#s)|x(?#e-)(?#n-)(?#i-)(?#c-)(?#a-)(?#l-)|(?#u-)(?#l-)(?#t-)(?#r-)(?#a-)(?#m-))\b|(?#v-)(?#i-)(?#o-)(?#x-)|(?#t-)(?#y-)(?#l-)(?#e-)(?#n-))"
  549. "Viagra/valium/vicodin/xanax/cialis/xenical/ultram/viox/tylen"
  550. M
  551. ""
  552. ""
  553. body 2255.796725 26 559 0 678
  554. rendering 766.097830 0 14 0 75
  555. subject 7344.730180 278 588 0 11854
  556.  
  557. "(?i)\b(?:(?#r-)\w?(?#e-)\w?(?#f-)\w?(?#i-)\w?(?#n-)|(?#m-)(?#o-)(?:(?#r-)(?#t-)|(?#t-)(?#r-))(?#g-)|(?:(?#h-)(?#o-)(?#m-)(?#e-)|(?#a-)(?#u-)(?#t-)(?#o-)) ?(?#l-)(?#o-)(?#a-)(?#n))"
  558. "Refin/mortgage/(home/auto loan)"
  559. M
  560. ""
  561. ""
  562. body 908.028723 199 561 0 848
  563. rendering 146.090984 0 13 0 51
  564. subject 2712.912097 269 581 0 10825
  565.  
  566. "(?i)<a\s+href\s*=\s*"http://\S+">.+</a>"
  567. "Href tag"
  568. M
  569. ""
  570. ""
  571. rendering 1901.447072 0 14 0 71
  572. subject 0.000000 0 0 0 0
  573.  
  574. "(?i)(?#<_)table"
  575. "HTML table tag"
  576. M
  577. ""
  578. ""
  579. body 1360.851636 39 13 0 160
  580.  
  581. "(?i)(?:we(?#i)(?#g)ht|f(?#a)t)\s+(?:l(?#o)ss|reduction)"
  582. "Weight/fat loss/reduction"
  583. M
  584. ""
  585. ""
  586. body 434.304087 0 555 0 456
  587. rendering 235.316301 0 14 0 70
  588. subject 618.873008 4 585 0 11390
  589.  
  590. "(?i)\.pif$"
  591. "Windoze .pif files"
  592. M
  593. ""
  594. ""
  595. filenames 57.079894 1 590 0 12924
  596.  
  597. "(?i)(?:st(?#o-)ck|invest(?:ment|or))[\W_]+(?:pick|profile|market watcher|alert)"
  598. "Stocks/investment/investor pick/profile/alert"
  599. M
  600. ""
  601. ""
  602. body 2286.961280 11 559 0 554
  603.  
  604. "^(?:\s*(?i)http://\S+)+$"
  605. "Nothing but a URL"
  606. M
  607. ""
  608. ""
  609. body 607.540140 1 550 0 420
  610.  
  611. "(?i)(?:(?#d-)(?#a-)(?#r-)(?#v-)(?#o-)(?#n-)|(?#z-)(?#y-)(?#r-)(?#t-)(?#e-)(?#c-)|(?#a-)(?#l-)(?#l-)(?#e-)(?#g-)(?#r-)(?#a-)|(?#l-)(?#i-)(?#p-)(?#i-)(?#t-)(?#o-)(?#r-))"
  612. "Darvon, zyrtec, allegra, lipitor"
  613. M
  614. ""
  615. ""
  616. body 1089.515260 0 555 0 450
  617. rendering 1688.204453 0 14 0 75
  618. subject 2887.931903 0 585 0 11376
  619.  
  620. "(?i)\S<font\s+(?:style\s*=\s*"font-size:\s+\dpx"|size\s*=\s*"?\d(?:px)?"?)"
  621. "Stuffing small texts in words"
  622. M
  623. ""
  624. ""
  625. body 3446.708902 100 14 1 241
  626.  
  627. "(?i)(?:cash\s+flow|cc\s+debt|(?#cash))"
  628. "Cash flow/cc debt/cash (obfuscated)"
  629. M
  630. ""
  631. ""
  632. body 2496.302302 2 556 0 487
  633. rendering 276.673405 0 14 0 70
  634.  
  635. "(?i)\.cpl$"
  636. "Windoze control panel stuff?"
  637. M
  638. ""
  639. ""
  640. filenames 29.707297 0 588 0 12922
  641.  
  642. "(?i)(?#<_)(?:i?frame|base|marquee)"
  643. "Dangerous tags I"
  644. M
  645. ""
  646. ""
  647. body 1838.821216 70 15 3 331
  648.  
  649. "^\W?ADV?[ :\W]"
  650. "ADV prefix"
  651. M
  652. ""
  653. ""
  654. subject 82.143163 0 585 0 11485
  655.  
  656. "(?i)(?:(?#F-)(?#D-)(?#A)\s+(?#a-)(?#p-)(?#p-)(?#r-)(?#o-)(?#v-)(?#e-)d|\brx\b)"
  657. "FDA approved/RX"
  658. M
  659. ""
  660. ""
  661. body 521.943738 6 557 1 532
  662. rendering 218.083348 0 14 0 75
  663. subject 1059.619081 28 588 0 11514
  664.  
  665. "(?i)(?#s-)(?#e-)(?#c-)(?#u-)(?#r-)(?#i-)(?#t-)(?#i-)(?#e-)(?#s-)\s+(?:(?#e-)(?#x-)(?#c-)(?#h-)(?#a-)(?#n-)(?#g-)(?#e-)|litigation\s+reform)?\s+(?#a-)(?#c-)(?#t-)"
  666. "Stock news disclaimer II"
  667. M
  668. ""
  669. ""
  670. body 12517.842466 9 559 0 511
  671.  
  672. "(?is)(?:(?#r-)(?#o-)(?#l-)(?#e-)(?#x-)|adobe.+microsoft|microsoft.+adobe|(?:adobe.+){4,}|photoshop.+office|office.+photoshop|c(?#a-)b(?#l-)(?#e-).*f(?#i-)(?#l-)t(?#e-)r|epson.+canon|canon.+epson)"
  673. "Brand names"
  674. M
  675. ""
  676. ""
  677. body 2182.117442 35 562 1 622
  678. rendering 1034.233942 0 14 0 69
  679. subject 1659.657540 91 588 0 11699
  680.  
  681. "(?i)http://[^> ]*\?[^> ]*(?:id|ref)="
  682. "Site tracking"
  683. M
  684. ""
  685. ""
  686. body 1078.278398 50 559 5 709
  687.  
  688. "(?i)(?#p-)(?#r-)(?#e-)(?#a-)(?#p-)(?#p-)(?#r-)(?#o-)(?#v-)(?#e-)(?#d-)"
  689. "Pre-approved"
  690. M
  691. ""
  692. ""
  693. body 179.146120 2 556 0 487
  694. rendering 83.931855 0 14 0 70
  695. subject 976.827091 13 587 0 11416
  696.  
  697. "(?i)^postmaster"
  698. "Bounces etc"
  699. M
  700. ""
  701. ""
  702. sender 0.000000 0 0 0 0
  703.